library(haven)
Data <- read.csv("/media/empro/5C02C2EB02C2C8EA/Ubuntu/Fendler/ovaryAnalysis/processed.csv", header = TRUE)
#View(Data)
Labels <- Data[c(1)]
Data <- Data[-c(1)]

zbadamy macierz korelacji

corMatrix <- cor(Data, method = 'spearman')
#heatm <- heatmap(corMatrix)
heatm <- heatmap(corMatrix, Rowv = NA, Colv = NA)

Mediany

library(data.table)
data.table 1.10.4.3
  The fastest way to learn (by data.table authors): https://www.datacamp.com/courses/data-analysis-the-data-table-way
  Documentation: ?data.table, example(data.table) and browseVignettes("data.table")
  Release notes, videos and slides: http://r-datatable.com
View(Labels)

Sprawdz dystrybucje

library(ggplot2)
for(colmn in Data)
{
  hist(colmn)
}

toM <- subset(Data, Labels[c(1)] == 'can')
#View(toM)
#toM <- setDT(Data, key=Labels)['can']

policz mediane

names <- c()
meds <- c()
ps <- c()
for(i in 1:ncol(toM))
{
  med = median(toM[, i])
  #print(median(as.numeric(as.vector(toM[c(i)]))) )
  name = colnames(toM)[i]
  p = wilcox.test(Data[, i] ~ Labels[, 1])$p.value
  
  #cat("Nazwa: ", name, "  mediana: ", med, "  p: ", p, "\n")
  
  names <- c(names, name)
  meds <- c(meds, med)
  ps <- c(ps, p)
}
#meds <- log2(meds)
volData = data.frame(names, meds, ps)
#View(head(volData, n=10) )
volData <- volData[order(volData$ps),]
View(head(volData, n=10) )

Beniamini-Hochberg Procedure - NOPE FDR

bh = p.adjust(volData$ps, method = 'fdr')
#View(head(bh, n=10))
volData <- data.frame(volData, bh)
View(head(volData, n=10))

Rysujemy piękny volcanoPlot

library(dplyr)

Attaching package: ‘dplyr’

The following objects are masked from ‘package:data.table’:

    between, first, last

The following objects are masked from ‘package:stats’:

    filter, lag

The following objects are masked from ‘package:base’:

    intersect, setdiff, setequal, union
library(ggplot2)
View(volData)
drawRes = mutate(volData, sig=ifelse(volData$bh < 0.05, 'FDR<0.05', 'Not Sig'))
volPlo = ggplot(drawRes, aes(meds, -log10(ps))) + geom_point(aes(col=sig)) + scale_color_manual(values = c('red', 'black'))
#0volPlo <- volPlo + geom_text(data=filter(drawRes, bh<0.05), aes(label=names))
volPlo <- volPlo + scale_x_continuous(limits = c(-2, 2))
volPlo

move labels

library(ggrepel)

volPlo <- volPlo + geom_text_repel(data=filter(drawRes, bh < 0.05), aes(label=names))
volPlo

Machine Learning

LS0tCnRpdGxlOiAiUiBOb3RlYm9vayIKb3V0cHV0OiBodG1sX25vdGVib29rCi0tLQoKYGBge3J9CmxpYnJhcnkoaGF2ZW4pCkRhdGEgPC0gcmVhZC5jc3YoIi9tZWRpYS9lbXByby81QzAyQzJFQjAyQzJDOEVBL1VidW50dS9GZW5kbGVyL292YXJ5QW5hbHlzaXMvcHJvY2Vzc2VkLmNzdiIsIGhlYWRlciA9IFRSVUUpCiNWaWV3KERhdGEpCmBgYApgYGB7cn0KTGFiZWxzIDwtIERhdGFbYygxKV0KRGF0YSA8LSBEYXRhWy1jKDEpXQpgYGAKCnpiYWRhbXkgbWFjaWVyeiBrb3JlbGFjamkgCmBgYHtyfQpjb3JNYXRyaXggPC0gY29yKERhdGEsIG1ldGhvZCA9ICdzcGVhcm1hbicpCmBgYAoKYGBge3J9CiNoZWF0bSA8LSBoZWF0bWFwKGNvck1hdHJpeCkKaGVhdG0gPC0gaGVhdG1hcChjb3JNYXRyaXgsIFJvd3YgPSBOQSwgQ29sdiA9IE5BKQpgYGAKTWVkaWFueQpgYGB7cn0KbGlicmFyeShkYXRhLnRhYmxlKQpWaWV3KExhYmVscykKYGBgClNwcmF3ZHogZHlzdHJ5YnVjamUKYGBge3J9CmxpYnJhcnkoZ2dwbG90MikKCmZvcihjb2xtbiBpbiBEYXRhKQp7CiAgaGlzdChjb2xtbikKfQpgYGAKCmBgYHtyfQp0b00gPC0gc3Vic2V0KERhdGEsIExhYmVsc1tjKDEpXSA9PSAnY2FuJykKI1ZpZXcodG9NKQojdG9NIDwtIHNldERUKERhdGEsIGtleT1MYWJlbHMpWydjYW4nXQpgYGAKcG9saWN6IG1lZGlhbmUKYGBge3J9Cm5hbWVzIDwtIGMoKQptZWRzIDwtIGMoKQpwcyA8LSBjKCkKZm9yKGkgaW4gMTpuY29sKHRvTSkpCnsKICBtZWQgPSBtZWRpYW4odG9NWywgaV0pCiAgI3ByaW50KG1lZGlhbihhcy5udW1lcmljKGFzLnZlY3Rvcih0b01bYyhpKV0pKSkgKQogIG5hbWUgPSBjb2xuYW1lcyh0b00pW2ldCiAgcCA9IHdpbGNveC50ZXN0KERhdGFbLCBpXSB+IExhYmVsc1ssIDFdKSRwLnZhbHVlCiAgCiAgI2NhdCgiTmF6d2E6ICIsIG5hbWUsICIgIG1lZGlhbmE6ICIsIG1lZCwgIiAgcDogIiwgcCwgIlxuIikKICAKICBuYW1lcyA8LSBjKG5hbWVzLCBuYW1lKQogIG1lZHMgPC0gYyhtZWRzLCBtZWQpCiAgcHMgPC0gYyhwcywgcCkKfQoKYGBgCmBgYHtyfQojbWVkcyA8LSBsb2cyKG1lZHMpCnZvbERhdGEgPSBkYXRhLmZyYW1lKG5hbWVzLCBtZWRzLCBwcykKI1ZpZXcoaGVhZCh2b2xEYXRhLCBuPTEwKSApCgp2b2xEYXRhIDwtIHZvbERhdGFbb3JkZXIodm9sRGF0YSRwcyksXQpWaWV3KGhlYWQodm9sRGF0YSwgbj0xMCkgKQpgYGAKCkJlbmlhbWluaS1Ib2NoYmVyZyBQcm9jZWR1cmUgLSBOT1BFCkZEUgpgYGB7cn0KYmggPSBwLmFkanVzdCh2b2xEYXRhJHBzLCBtZXRob2QgPSAnZmRyJykKCiNWaWV3KGhlYWQoYmgsIG49MTApKQoKdm9sRGF0YSA8LSBkYXRhLmZyYW1lKHZvbERhdGEsIGJoKQoKVmlldyhoZWFkKHZvbERhdGEsIG49MTApKQpgYGAKClJ5c3VqZW15IHBpxJlrbnkgdm9sY2Fub1Bsb3QKYGBge3J9CmxpYnJhcnkoZHBseXIpCmxpYnJhcnkoZ2dwbG90MikKYGBgCgpgYGB7cn0KVmlldyh2b2xEYXRhKQpgYGAKCmBgYHtyfQpkcmF3UmVzID0gbXV0YXRlKHZvbERhdGEsIHNpZz1pZmVsc2Uodm9sRGF0YSRiaCA8IDAuMDUsICdGRFI8MC4wNScsICdOb3QgU2lnJykpCgp2b2xQbG8gPSBnZ3Bsb3QoZHJhd1JlcywgYWVzKG1lZHMsIC1sb2cxMChwcykpKSArIGdlb21fcG9pbnQoYWVzKGNvbD1zaWcpKSArIHNjYWxlX2NvbG9yX21hbnVhbCh2YWx1ZXMgPSBjKCdyZWQnLCAnYmxhY2snKSkKCiMwdm9sUGxvIDwtIHZvbFBsbyArIGdlb21fdGV4dChkYXRhPWZpbHRlcihkcmF3UmVzLCBiaDwwLjA1KSwgYWVzKGxhYmVsPW5hbWVzKSkKCnZvbFBsbyA8LSB2b2xQbG8gKyBzY2FsZV94X2NvbnRpbnVvdXMobGltaXRzID0gYygtMiwgMikpCgp2b2xQbG8KYGBgCgptb3ZlIGxhYmVscwpgYGB7cn0KbGlicmFyeShnZ3JlcGVsKQoKdm9sUGxvIDwtIHZvbFBsbyArIGdlb21fdGV4dF9yZXBlbChkYXRhPWZpbHRlcihkcmF3UmVzLCBiaCA8IDAuMDUpLCBhZXMobGFiZWw9bmFtZXMpKQp2b2xQbG8KYGBgCgoKCk1hY2hpbmUgTGVhcm5pbmc=